// Copyright (c) 2011 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "base/i18n/char_iterator.h"

#include "base/strings/utf_string_conversions.h"
#include "testing/gtest/include/gtest/gtest.h"

namespace base {
namespace i18n {

    // Exercises UTF8CharIterator on an empty string and on a short string that
    // contains a two-byte sequence, checking the byte offset (array_pos), the
    // character index (char_pos) and the decoded value at every step.
    TEST(CharIteratorsTest, TestUTF8)
    {
        // Empty input: the iterator is already at the end and refuses to advance.
        std::string no_text;
        UTF8CharIterator no_text_iter(&no_text);
        ASSERT_TRUE(no_text_iter.end());
        ASSERT_EQ(0, no_text_iter.array_pos());
        ASSERT_EQ(0, no_text_iter.char_pos());
        ASSERT_FALSE(no_text_iter.Advance());

        // 's', [u with circumflex] encoded as two bytes, 'r'.
        std::string text("s\303\273r");
        UTF8CharIterator text_iter(&text);

        // State expected before each successful Advance().
        struct Step {
            int array_pos;
            int char_pos;
            int code_point;
        };
        const Step kSteps[] = {
            { 0, 0, 's' },
            { 1, 1, 251 },
            { 3, 2, 'r' },
        };
        const size_t kStepCount = sizeof(kSteps) / sizeof(kSteps[0]);

        for (size_t i = 0; i < kStepCount; ++i) {
            const Step& step = kSteps[i];
            ASSERT_FALSE(text_iter.end());
            ASSERT_EQ(step.array_pos, text_iter.array_pos());
            ASSERT_EQ(step.char_pos, text_iter.char_pos());
            ASSERT_EQ(step.code_point, text_iter.get());
            ASSERT_TRUE(text_iter.Advance());
        }

        // All characters consumed: 4 bytes, 3 characters.
        ASSERT_TRUE(text_iter.end());
        ASSERT_EQ(4, text_iter.array_pos());
        ASSERT_EQ(3, text_iter.char_pos());

        // Reading at the end has no specified result; it only must not crash.
        text_iter.get();

        // Advancing past the end is rejected.
        ASSERT_FALSE(text_iter.Advance());
    }

    // Exercises UTF16CharIterator on an empty string and on a string that mixes
    // single-codeword characters with one two-codeword character, checking the
    // codeword offset (array_pos), the character index (char_pos) and the
    // decoded value at every step.
    TEST(CharIteratorsTest, TestUTF16)
    {
        // Empty input: the iterator is already at the end and refuses to advance.
        string16 no_text = UTF8ToUTF16("");
        UTF16CharIterator no_text_iter(&no_text);
        ASSERT_TRUE(no_text_iter.end());
        ASSERT_EQ(0, no_text_iter.array_pos());
        ASSERT_EQ(0, no_text_iter.char_pos());
        ASSERT_FALSE(no_text_iter.Advance());

        // Four characters in the test string:
        //   x
        //   u with circumflex    - 2 bytes in UTF8, 1 codeword in UTF16
        //   math double-struck A - 4 bytes in UTF8, 2 codewords in UTF16
        //   z
        string16 text = UTF8ToUTF16("x\303\273\360\235\224\270z");
        UTF16CharIterator text_iter(&text);

        // State expected before each successful Advance().
        struct Step {
            int array_pos;
            int char_pos;
            int code_point;
        };
        const Step kSteps[] = {
            { 0, 0, 'x' },
            { 1, 1, 251 },
            { 2, 2, 120120 },
            { 4, 3, 'z' },
        };
        const size_t kStepCount = sizeof(kSteps) / sizeof(kSteps[0]);

        for (size_t i = 0; i < kStepCount; ++i) {
            const Step& step = kSteps[i];
            ASSERT_FALSE(text_iter.end());
            ASSERT_EQ(step.array_pos, text_iter.array_pos());
            ASSERT_EQ(step.char_pos, text_iter.char_pos());
            ASSERT_EQ(step.code_point, text_iter.get());
            ASSERT_TRUE(text_iter.Advance());
        }

        // All characters consumed: 5 codewords, 4 characters.
        ASSERT_TRUE(text_iter.end());
        ASSERT_EQ(5, text_iter.array_pos());
        ASSERT_EQ(4, text_iter.char_pos());

        // Reading at the end has no specified result; it only must not crash.
        text_iter.get();

        // Advancing past the end is rejected.
        ASSERT_FALSE(text_iter.Advance());
    }

} // namespace i18n
} // namespace base
